import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Load the dataset from a CSV file resolved relative to the working directory.
path_data = "pima-indians-diabetes.csv"
train = pd.read_csv(path_data)

# Quick overview of the loaded frame: first rows, then (rows, columns).
print(train.head())
print("train: ", train.shape)
# DataFrame.info() writes its summary to stdout itself and returns None, so it
# is called directly; wrapping it in print() would add a stray "None" line.
train.info()

# Columns whose zero entries are counted below.
# NOTE(review): the variable name suggests a 0 in these columns stands in for a
# missing measurement -- confirm against the dataset description.
NaN_col_names = [
    'Plasma_glucose_concentration',
    'blood_pressure',
    'Triceps_skin_fold_thickness',
    'serum_insulin',
    'BMI',
]
# Per-column count of entries that are exactly 0.
print((train[NaN_col_names] == 0).sum())














